PyPI - edwh-editorjs - Versions diffs - 1.0.1__py3-none-any.whl → 2.0.0__py3-none-any.whl - Mend

edwh-editorjs 1.0.1__py3-none-any.whl → 2.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (18) hide show

editorjs/__about__.py +1 -0
editorjs/__init__.py +5 -0
editorjs/blocks.py +670 -0
editorjs/core.py +119 -0
editorjs/exceptions.py +3 -0
editorjs/helpers.py +5 -0
editorjs/types.py +43 -0
edwh_editorjs-2.0.0.dist-info/METADATA +28 -0
edwh_editorjs-2.0.0.dist-info/RECORD +11 -0
{edwh_editorjs-1.0.1.dist-info → edwh_editorjs-2.0.0.dist-info}/licenses/LICENSE +1 -0
edwh_editorjs-1.0.1.dist-info/METADATA +0 -73
edwh_editorjs-1.0.1.dist-info/RECORD +0 -9
pyeditorjs/__about__.py +0 -1
pyeditorjs/__init__.py +0 -28
pyeditorjs/blocks.py +0 -309
pyeditorjs/exceptions.py +0 -19
pyeditorjs/parser.py +0 -75
{edwh_editorjs-1.0.1.dist-info → edwh_editorjs-2.0.0.dist-info}/WHEEL +0 -0

editorjs/__about__.py ADDED Viewed

	@@ -0,0 +1 @@
1	+ __version__ = "2.0.0"  # version string of the package release shown in this diff

editorjs/__init__.py ADDED Viewed

@@ -0,0 +1,5 @@
+from .core import EditorJS
+__all__ = [
+    "EditorJS",
+]

editorjs/blocks.py ADDED Viewed

@@ -0,0 +1,670 @@
+"""
+mdast to editorjs
+"""
+import abc
+import re
+import typing as t
+from html.parser import HTMLParser
+from urllib.parse import urlparse
+import markdown2
+from .exceptions import TODO
+from .types import EditorChildData, MDChildNode
+class EditorJSBlock(abc.ABC):
+    @classmethod
+    @abc.abstractmethod
+    def to_markdown(cls, data: EditorChildData) -> str: ...
+    @classmethod
+    @abc.abstractmethod
+    def to_json(cls, node: MDChildNode) -> list[dict]: ...
+    @classmethod
+    @abc.abstractmethod
+    def to_text(cls, node: MDChildNode) -> str: ...
+BLOCKS: dict[str, EditorJSBlock] = {}
+def block(*names: str):
+    def wrapper(cls):
+        for name in names:
+            BLOCKS[name] = cls
+        return cls
+    return wrapper
+def process_styled_content(item: MDChildNode, strict: bool = True) -> str:
+    """
+    Processes styled content (e.g., bold, italic) within a list item.
+    Args:
+        item: A ChildNode dictionary representing an inline element or text.
+        strict: Raise if 'type' is not one defined in 'html_wrappers'
+    Returns:
+        A formatted HTML string based on the item type.
+    """
+    _type = item.get("type")
+    html_wrappers = {
+        "text": "{value}",
+        "html": "{value}",
+        "emphasis": "<i>{value}</i>",
+        "strong": "<b>{value}</b>",
+        "strongEmphasis": "<b><i>{value}</i></b>",
+        "link": '<a href="{url}">{value}</a>',
+        "inlineCode": '<code class="inline-code">{value}</code>',
+        # todo: <mark>, linktool
+    }
+    if _type in BLOCKS:
+        return BLOCKS[_type].to_text(item)
+    if strict and _type not in html_wrappers:
+        raise ValueError(f"Unsupported type {_type} in paragraph")
+    # Process children recursively if they exist, otherwise use the direct value
+    if children := item.get("children"):
+        value = "".join(process_styled_content(child) for child in children)
+    else:
+        value = item.get("value", "")
+    template = html_wrappers.get(_type, "{value}")
+    return template.format(
+        value=value, url=item.get("url", ""), caption=item.get("caption", "")
+    )
+def default_to_text(node: MDChildNode):
+    return "".join(
+        process_styled_content(child) for child in node.get("children", [])
+    ) or process_styled_content(node)
+@block("heading", "header")
+class HeadingBlock(EditorJSBlock):
+    @classmethod
+    def to_markdown(cls, data: EditorChildData) -> str:
+        level = data.get("level", 1)
+        text = data.get("text", "")
+        if not (1 <= level <= 6):
+            raise ValueError("Header level must be between 1 and 6.")
+        return f"{'#' * level} {text}\n"
+    @classmethod
+    def to_json(cls, node: MDChildNode) -> list[dict]:
+        """
+        Converts a Markdown header block into structured block data.
+        Args:
+            node: A RootNode dictionary with 'depth' and 'children'.
+        Returns:
+            A ChildNode dictionary representing the header data, or None if no children exist.
+        Raises:
+            ValueError: If an unsupported heading depth is provided.
+        """
+        depth = node.get("depth")
+        if depth is None or not (1 <= depth <= 6):
+            raise ValueError("Heading depth must be between 1 and 6.")
+        return [{"data": {"level": depth, "text": cls.to_text(node)}, "type": "header"}]
+    @classmethod
+    def to_text(cls, node: MDChildNode) -> str:
+        children = node.get("children", [])
+        if children is None or not len(children) == 1:
+            raise ValueError("Header block must have exactly one child element")
+        child = children[0]
+        return child.get("value", "")
+@block("paragraph")
+class ParagraphBlock(EditorJSBlock):
+    @classmethod
+    def to_markdown(cls, data: EditorChildData) -> str:
+        text = data.get("text", "")
+        return f"{text}\n"
+    @classmethod
+    def to_json(cls, node: MDChildNode) -> list[dict]:
+        result = []
+        current_text = ""
+        skip = 0
+        nodes = node.get("children", [])
+        for idx, child in enumerate(nodes):
+            if skip:
+                skip -= 1
+                continue
+            _type = child.get("type")
+            # deal with custom types
+            if _type == "html" and child.get("value", "").startswith("<editorjs"):
+                # special type, e.g. <editorjs type="linkTool" href=...>...</editorjs>
+                if child.get("value", "").endswith("/>"):
+                    # self-closing
+                    result.append(EditorJSCustom.to_json(node))
+                    continue
+                else:
+                    # <editorjs>something</editorjs> = 3 children
+                    result.extend(
+                        EditorJSCustom.to_json({"children": nodes[idx : idx + 2]})
+                    )
+                    skip = 2
+                    continue
+            elif _type == "image":
+                if current_text:
+                    result.append({"data": {"text": current_text}, "type": "paragraph"})
+                    current_text = ""
+                result.extend(ImageBlock.to_json(child))
+            else:
+                child_text = cls.to_text(child)
+                _child_text = child_text.strip()
+                if _child_text.startswith("|") and _child_text.endswith("|"):
+                    # note: this just supports text-only tables.
+                    # tables with more complex elements break into multiple children.
+                    # and mdast DOES support converting into a Table/TableCell structure
+                    # via the GFM exttension
+                    # but their default mdast->md converter does NOT implement these functionalities.
+                    result.extend(TableBlock.to_json(child))
+                    continue
+                current_text += child_text
+        # final text after image:
+        if current_text:
+            result.append({"data": {"text": current_text}, "type": "paragraph"})
+        return result
+    @classmethod
+    def to_text(cls, node: MDChildNode) -> str:
+        return default_to_text(node)
+@block("list")
+class ListBlock(EditorJSBlock):
+    @classmethod
+    def to_markdown(cls, data: EditorChildData) -> str:
+        style = data.get("style", "unordered")
+        items = data.get("items", [])
+        def parse_items(subitems: list[dict[str, t.Any]], depth: int = 0) -> str:
+            markdown_items = []
+            for index, item in enumerate(subitems):
+                prefix = f"{index + 1}." if style == "ordered" else "-"
+                line = f"{'\t' * depth}{prefix} {item['content']}"
+                markdown_items.append(line)
+                # Recurse if there are nested items
+                if item.get("items"):
+                    markdown_items.append(parse_items(item["items"], depth + 1))
+            return "\n".join(markdown_items)
+        return "\n" + parse_items(items) + "\n\n"
+    @classmethod
+    def to_json(cls, node: MDChildNode) -> list[dict]:
+        """
+        Converts a Markdown list block with nested items and styling into structured block data.
+        Args:
+            node: A RootNode dictionary with 'ordered' and 'children'.
+        Returns:
+            A dictionary representing the structured list data with 'items' and 'style'.
+        """
+        items = []
+        # checklists are not supported (well) by mdast
+        # so we detect it ourselves:
+        could_be_checklist = True
+        def is_checklist(value: str) -> bool:
+            return value.strip().startswith(("[ ]", "[x]"))
+        for child in node["children"]:
+            content = ""
+            subitems = []
+            # child can have content and/or items
+            for grandchild in child["children"]:
+                _type = grandchild.get("type", "")
+                if _type == "paragraph":
+                    subcontent = ParagraphBlock.to_text(grandchild)
+                    could_be_checklist = could_be_checklist and is_checklist(subcontent)
+                    content += "" + subcontent
+                elif _type == "list":
+                    could_be_checklist = False
+                    subitems.extend(ListBlock.to_json(grandchild)[0]["data"]["items"])
+                else:
+                    raise ValueError(f"Unsupported type {_type} in list")
+            items.append(
+                {
+                    "content": content,
+                    "items": subitems,
+                }
+            )
+        # todo: detect 'checklist':
+        """
+        type: checklist
+        data: {items: [{text: "a", checked: false}, {text: "b", checked: false}, {text: "c", checked: true},…]}
+        """
+        if could_be_checklist:
+            return [
+                {
+                    "type": "checklist",
+                    "data": {
+                        "items": [
+                            {
+                                "text": x["content"]
+                                .removeprefix("[ ] ")
+                                .removeprefix("[x] "),
+                                "checked": x["content"].startswith("[x]"),
+                            }
+                            for x in items
+                        ]
+                    },
+                }
+            ]
+        else:
+            return [
+                {
+                    "data": {
+                        "items": items,
+                        "style": "ordered" if node.get("ordered") else "unordered",
+                    },
+                    "type": "list",
+                }
+            ]
+    @classmethod
+    def to_text(cls, node: MDChildNode) -> str:
+        return ""
+@block("checklist")
+class ChecklistBlock(ListBlock):
+    @classmethod
+    def to_markdown(cls, data: EditorChildData) -> str:
+        markdown_items = []
+        for item in data.get("items", []):
+            text = item.get("text", "").strip()
+            char = "x" if item.get("checked", False) else " "
+            markdown_items.append(f"- [{char}] {text}")
+        return "\n" + "\n".join(markdown_items) + "\n\n"
+@block("thematicBreak", "delimiter")
+class DelimiterBlock(EditorJSBlock):
+    @classmethod
+    def to_markdown(cls, data: EditorChildData) -> str:
+        return "***\n"
+    @classmethod
+    def to_json(cls, node: MDChildNode) -> list[dict]:
+        return [
+            {
+                "type": "delimiter",
+                "data": {},
+            }
+        ]
+    @classmethod
+    def to_text(cls, node: MDChildNode) -> str:
+        return ""
+@block("code")
+class CodeBlock(EditorJSBlock):
+    @classmethod
+    def to_markdown(cls, data: EditorChildData) -> str:
+        code = data.get("code", "")
+        return f"```\n" f"{code}" f"\n```\n"
+    @classmethod
+    def to_json(cls, node: MDChildNode) -> list[dict]:
+        return [
+            {
+                "data": {"code": cls.to_text(node)},
+                "type": "code",
+            }
+        ]
+    @classmethod
+    def to_text(cls, node: MDChildNode) -> str:
+        return node.get("value", "")
+@block("image")
+class ImageBlock(EditorJSBlock):
+    @classmethod
+    def to_markdown(cls, data: EditorChildData) -> str:
+        url = data.get("url", "") or data.get("file", {}).get("url", "")
+        caption = data.get("caption", "")
+        return f"""![{caption}]({url} "{caption}")\n"""
+    @classmethod
+    def to_json(cls, node: MDChildNode) -> list[dict]:
+        return [
+            {
+                "type": "image",
+                "data": {
+                    "caption": cls.to_text(node),
+                    "file": {"url": node.get("url")},
+                },
+            }
+        ]
+    @classmethod
+    def to_text(cls, node: MDChildNode) -> str:
+        return node.get("alt") or node.get("caption") or ""
+@block("blockquote", "quote")
+class QuoteBlock(EditorJSBlock):
+    re_cite = re.compile(r"<cite>(.+?)<\/cite>")
+    @classmethod
+    def to_markdown(cls, data: EditorChildData) -> str:
+        text = data.get("text", "")
+        result = f"> {text}\n"
+        if caption := data.get("caption", ""):
+            result += f"> <cite>{caption}</cite>\n"
+        return result
+    @classmethod
+    def to_json(cls, node: MDChildNode) -> list[dict]:
+        caption = ""
+        text = cls.to_text(node).replace("\n", "<br/>\n")
+        if cite := re.search(cls.re_cite, text):
+            # Capture the value of the first group
+            caption = cite.group(1)
+            # Remove the <cite>...</cite> tags from the text
+            text = re.sub(cls.re_cite, "", text)
+        return [
+            {
+                "data": {
+                    "alignment": "left",
+                    "caption": caption,
+                    "text": text,
+                },
+                "type": "quote",
+            }
+        ]
+    @classmethod
+    def to_text(cls, node: MDChildNode) -> str:
+        return default_to_text(node)
+@block("raw")
+class RawBlock(EditorJSBlock):
+    @classmethod
+    def to_markdown(cls, data: EditorChildData) -> str:
+        return data.get("html", "")
+    @classmethod
+    def to_json(cls, node: MDChildNode) -> list[dict]:
+        raise TODO(node)
+    @classmethod
+    def to_text(cls, node: MDChildNode) -> str:
+        raise TODO(node)
+@block("table")
+class TableBlock(EditorJSBlock):
+    @classmethod
+    def to_markdown(cls, data: EditorChildData) -> str:
+        """
+        | Script | Interpreter | User | System |   |
+        |--------|-------------|------|--------|---|
+        |        |             |      |        |   |
+        |        |             |      |        |   |
+        |        |             |      |        |   |
+        """
+        table = ""
+        rows = data.get("content", [])
+        # Add an empty header row if no headings are provided
+        if not data.get("withHeadings", False) and rows:
+            table += "| " + " | ".join([""] * len(rows[0])) + " |\n"
+            table += "|" + " - |" * len(rows[0]) + "\n"
+        # Populate rows
+        for idx, tr in enumerate(rows):
+            table += "| " + " | ".join(tr) + " |\n"
+            # Add separator if headings are enabled and it's the first row
+            if not idx and data.get("withHeadings", False):
+                table += "|" + " - |" * len(tr) + "\n"
+        return f"\n{table}\n"
+    @classmethod
+    def to_json(cls, node: MDChildNode) -> list[dict]:
+        # content":[["Yeah","Okay"],["<i>1</i>","<code class=\"inline-code\">2</code>"]]}}]
+        table = []
+        with_headings = False
+        # first row is headings or empty. If not empty, withHeadings is True
+        # second row must be ignored
+        for idx, row in enumerate(node.get("value", "").strip().split("\n")):
+            tr = [_.strip() for _ in row.split("|")[1:-1]]
+            if not idx:
+                # first
+                if any(tr):
+                    with_headings = True
+                    table.append(tr)
+            elif idx == 1:
+                continue
+            else:
+                table.append(tr)
+        return [
+            {
+                "type": "table",
+                "content": table,
+                "withHeadings": with_headings,
+            }
+        ]
+    @classmethod
+    def to_text(cls, node: MDChildNode) -> str:
+        raise TODO(node)
+@block("linkTool")
+class LinkBlock(EditorJSBlock):
+    @classmethod
+    def to_markdown(cls, data: EditorChildData) -> str:
+        link = data.get("link", "")
+        meta = data.get("meta", {})
+        title = meta.get("title", "")
+        description = meta.get("description", "")
+        image = meta.get("image", {}).get("url", "")
+        return f"""<editorjs type="linkTool" href="{link}" title="{title}" image="{image}">{description}</editorjs>"""
+    @classmethod
+    def to_json(cls, node: MDChildNode) -> list[dict]:
+        return [
+            {
+                "type": "linkTool",
+                "data": {
+                    "link": node.get("href", ""),
+                    "meta": {
+                        "title": node.get("title", ""),
+                        "description": node.get("body", ""),
+                        "image": {
+                            "url": node.get("image", ""),
+                        },
+                    },
+                },
+            }
+        ]
+    @classmethod
+    def to_text(cls, node: MDChildNode) -> str:
+        url = node.get("href", "")
+        image = node.get("image", "")
+        title = node.get("title", "")
+        body = node.get("body", "")
+        domain = urlparse(url).netloc
+        return f"""
+        <div class="link-tool">
+            <a class="link-tool__content link-tool__content--rendered" target="_blank"
+               rel="nofollow noindex noreferrer" href="{url}">
+                <div class="link-tool__image"
+                     style="background-image: url(&quot;{image}&quot;);"></div>
+                <div class="link-tool__title">{title}</div>
+                <p class="link-tool__description">{body}</p>
+                <span class="link-tool__anchor">{domain}</span>
+            </a>
+        </div>
+        """
+@block("attaches")
+class AttachmentBlock(EditorJSBlock):
+    @classmethod
+    def to_markdown(cls, data: EditorChildData) -> str:
+        file = data.get("file", {}).get("url", "")
+        title = data.get("title", "")
+        return f"""<editorjs type="attaches" file="{file}">{title}</editorjs>"""
+    @classmethod
+    def to_json(cls, node: MDChildNode) -> list[dict]:
+        return [
+            {
+                "type": "attaches",
+                "data": {
+                    "file": {"url": node.get("file", "")},
+                    "title": node.get("body", ""),
+                },
+            }
+        ]
+    @classmethod
+    def to_text(cls, node: MDChildNode) -> str:
+        return f"""
+        <div class="cdx-attaches cdx-attaches--with-file">
+            <div class="cdx-attaches__file-icon">
+                <div class="cdx-attaches__file-icon-background">
+                    <svg xmlns="http://www.w3.org/2000/svg" width="24" height="24" fill="none" viewBox="0 0 24 24"><path stroke="currentColor" stroke-linecap="round" stroke-linejoin="round" stroke-width="2" d="M13.3236 8.43554L9.49533 12.1908C9.13119 12.5505 8.93118 13.043 8.9393 13.5598C8.94741 14.0767 9.163 14.5757 9.53862 14.947C9.91424 15.3182 10.4191 15.5314 10.9422 15.5397C11.4653 15.5479 11.9637 15.3504 12.3279 14.9908L16.1562 11.2355C16.8845 10.5161 17.2845 9.53123 17.2682 8.4975C17.252 7.46376 16.8208 6.46583 16.0696 5.72324C15.3184 4.98066 14.3086 4.55425 13.2624 4.53782C12.2162 4.52138 11.2193 4.91627 10.4911 5.63562L6.66277 9.39093C5.57035 10.4699 4.97032 11.9473 4.99467 13.4979C5.01903 15.0485 5.66578 16.5454 6.79264 17.6592C7.9195 18.7731 9.43417 19.4127 11.0034 19.4374C12.5727 19.462 14.068 18.8697 15.1604 17.7907L18.9887 14.0354"></path></svg>
+                </div>
+            </div>
+            <div class="cdx-attaches__file-info">
+                <div class="cdx-attaches__title" data-placeholder="File title" data-empty="false">
+                {node.get("body", "")}
+                </div>
+            </div>
+            <a class="cdx-attaches__download-button" href="{node.get('file', '')}" target="_blank" rel="nofollow noindex noreferrer">
+                <svg xmlns="http://www.w3.org/2000/svg" width="24" height="24" fill="none" viewBox="0 0 24 24"><path stroke="currentColor" stroke-linecap="round" stroke-width="2" d="M7 10L11.8586 14.8586C11.9367 14.9367 12.0633 14.9367 12.1414 14.8586L17 10"></path></svg>
+            </a>
+        </div>
+        """
+class AttributeParser(HTMLParser):
+    def __init__(self):
+        super().__init__()
+        self.attributes = {}
+        self.data = None
+    def handle_starttag(self, tag, attrs):
+        # Collect attributes when the tag is encountered
+        self.attributes = dict(attrs)
+    def handle_data(self, data):
+        self.data = data
+class EditorJSCustom(EditorJSBlock, markdown2.Extra):
+    """
+    Special type of block to deal with custom attributes
+    """
+    name = "editorjs"
+    order = (), (markdown2.Stage.POSTPROCESS,)
+    @classmethod
+    def parse_html(cls, html: str):
+        parser = AttributeParser()
+        parser.feed(html)
+        return parser.attributes, parser.data
+    @classmethod
+    def to_markdown(cls, data: EditorChildData) -> str:
+        raise TODO()
+    @classmethod
+    def to_json(cls, node: MDChildNode) -> list[dict]:
+        html = "".join(_["value"] for _ in node.get("children", []))
+        attrs, body = cls.parse_html(html)
+        _type = attrs.get("type", "")
+        attrs.setdefault("body", body)  # only if there is no such attribute yet
+        if not (handler := BLOCKS.get(_type)):
+            raise ValueError(f"Unknown custom type {_type}")
+        return handler.to_json(attrs)
+    @classmethod
+    def to_text(cls, node: MDChildNode) -> str:
+        raise TODO()
+    # markdown2:
+    re_short = re.compile(r"<editorjs.*?/>")
+    re_long = re.compile(r"<editorjs.*?>.*?</editorjs>")
+    def run(self, text: str) -> str:
+        def replace_html(match):
+            attrs, body = self.parse_html(match.group())
+            _type = attrs.get("type", "")
+            attrs.setdefault("body", body)  # only if there is no such attribute yet
+            if not (handler := BLOCKS.get(_type)):
+                raise ValueError(f"Unknown custom type {_type}")
+            return handler.to_text(attrs)
+        # Substitute using the replacement functions
+        text = self.re_long.sub(replace_html, text)
+        text = self.re_short.sub(replace_html, text)
+        return text
+EditorJSCustom.register()

edwh-editorjs 1.0.1__py3-none-any.whl → 2.0.0__py3-none-any.whl

edwh-editorjs 1.0.1__py3-none-any.whl → 2.0.0__py3-none-any.whl